from lxml import etree

if __name__ == '__main__':
    # Parse the contents of the file with an explicitly chosen parser.
    # HTMLParser is used so that the input is read as HTML rather than
    # as strict XML.
    tree = etree.parse(source="hello.html", parser=etree.HTMLParser())

    # etree.tounicode() is deprecated in lxml; the documented replacement
    # is etree.tostring(..., encoding="unicode"), which returns a str.
    # The root element is serialised (not the tree wrapper) so that only
    # the element markup is printed.
    markup = etree.tostring(
        tree.getroot(), encoding="unicode", pretty_print=True
    )
    print(markup)

